| Parameter | Value |
total_samples | 10000000 |
batch_size | 8 |
stage_samples_multiplier | 100000000000 |
update_interval | 250 |
window_size | 100 |
num_best_models_to_keep | 1 |
sampling_mode | Loss-weighted |
loss_weight_temperature | 0.5 |
loss_weight_refresh_interval | 50 |
stop_on_divergence | True |
divergence_gap | 0.002 |
divergence_ratio | 1.5 |
divergence_patience | 50 |
divergence_min_updates | 10 |
val_spike_threshold | 2.0 |
val_spike_window | 15 |
val_spike_frequency | 0.75 |
val_plateau_patience | 250 |
val_plateau_min_delta | 0.0001 |
custom_lr | 0.0001 |
disable_lr_scaling | True |
custom_warmup | -1 |
lr_min_ratio | 0.001 |
resume_warmup_ratio | 0.05 |
plateau_factor | 0.8 |
plateau_patience | 15 |
preserve_optimizer | False |
preserve_scheduler | True |
samples_mode | Train additional samples |
num_random_obs_to_visualize | 2 |
selected_frame_offset | 3 |
runs_per_stage | 5 |
serial_runs | True |
clean_old_checkpoints | True |
enable_baseline | False |
baseline_runs_per_stage | 1 |
run_id | shoulder_session_multiheight_large_decoder |
enable_wandb | True |
wandb_project | developmental-robot-movement |
lr_sweep.lr_min | 1e-07 |
lr_sweep.lr_max | 0.01 |
lr_sweep.phase_a_num_candidates | 5 |
lr_sweep.phase_a_seeds | 1 |
lr_sweep.phase_a_time_budget_min | 3.0 |
lr_sweep.phase_a_survivor_count | 2 |
lr_sweep.phase_b_seeds | 3 |
lr_sweep.phase_b_time_budget_min | 10.0 |
lr_sweep.ranking_metric | median_best_val |
lr_sweep.min_samples_before_timeout | 1000 |
lr_sweep.min_evals_before_stop | 5 |
lr_sweep.save_sweep_state | True |
plateau_sweep.enabled | True |
plateau_sweep.plateau_ema_alpha | 0.85 |
plateau_sweep.plateau_improvement_threshold | 0.0015 |
plateau_sweep.plateau_patience | 25 |
plateau_sweep.cooldown_updates | 5 |
plateau_sweep.max_sweeps_per_stage | 2 |
plateau_sweep.min_sweep_improvement | 0.0 |
initial_sweep_enabled | True |
stage_time_budget_min | 180 |